D0073 CNT 



1 CGACAGTCTTTAGTAGGGAAAGGAGACAAGTGCTAGCTACTGCCGCCCAAGTGGAAGGTG 6 0 



6 1 GGTGAAATTGCTCACTCTTC^CCCCACTGACGCTTTTGCGCACCTGGAAAAGCGGTTCCA 120 



121 GTTTGCGCCCGTCGCCGCCTTACAGCCGACAGGAGACCAGCGCTACCCAAGTCACGTGGG 180 



181 TTCAGCCTGCAGCTTTCTTGGCCCGAAAGGGAATTATCTATAGAGTAAGTATGCTAATCT 240 
1 M L I L 4 



..«••* 
241 TGACTAAGACTGCAGGAGTTTTTTTTAAACCATCAAAAAGGAAAGTTTATGAATTTTTAA 3 00 
5 TKTAGVFFKP SKRKVYEFLR 24 



301 GAAGTTTTAATTTTCATCCTGGAACACTATTTCTTCATAAAATAGTATTGGGAATTGAAA 360 

25 SFNFHPGTLFLHKIVLGIET 44 

• •••*• 

361 CTAGTTGTGATGAT ACAGCAGCTGCTGTGGTGGATGAAACTGGAAATGTGTTGGGAGAAG 420 

45 SCDDTAAAVVDETGNVLGEA 64 

421 CAATACATTCCCAAACTGAAGTTCATTTAAAAACAGGTGGGATTGTTCCTCCAGCAGCTC 480 

65 IHSQTEVHLKTGG IVP PAAQ 84 

481 AACAGCTTCACAGAGAAAATATTCAACGAATAGTACAAGAAGCTCTTTCTGCCAGTGGAG 54 0 

85 QLHRENIQRI VQEALSA SGV 104 

.... . • 

541 TCTCTCCAAGTGACCTCTCAGCAATTGCAACTACCATAAAACCAGGACTTGCTTTAAGCC 600 

105 SPSDLSAIATTI KPGLALSL 124 

601 TGGGAGTGGGCTTATCATTTAGCTTACAGCTGGTAGGACAGTTAAAAAAGCCATTCATTC 660 

125 GVGLSFSLQLVGQLKKPFIP 144 



661 CCATTCATCAT ATGGAGGCTC ATGCACTTACTATTAGGTTGACCAATAAAGTAGAATTTC 72 0 
145 I l^S^^B^^S^^M ALTIRLTNKVEFP 164 



721 CTTTTTTAGTTCTTTTGATTTCTGGAGGTCACTGTCTGTTGGCATTAGTTCAAGGAGTTT 78 0 
165 FLVLLI SGGHCLLALVQGVS 184 



781 CAGATTTTCTGCTTCTTGGAAAGTCTTTGGACATAGCACCAGGTGACATGCTTGACAAGG 84 0 
185 DFLLLGKSLDIAPGDMLDKV 204 



841 TGGCAAGAAGACTTTCTTTAATAAAACATCCAGAGTGCTCCACCATGAGTGGTGGGAAAG 900 
205 ARRLSLIKHPECSTMSGGKA 224 
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901 CCATAGAACATTTGGCCAAACAAGGAAATAGATTTCATTTTGACATCAAACCTCCCTTGC 960 
225 I EHLAKQGNRFHFD I KPPLH 244 



961 ATCATGCTAAAAATTGTGATTTTTCTTTTACTGGACTTCAACACGTTACTGATAAAATAA 1020 
245 HAKNCDFSFTGLQHVTDKI I 264 



1021 TAATGAAAAAGGAAAAAGAGGAAGGTATTGAGAAGGGGCAAATCCTGTCTTCAGCAGCAG 1080 
265 MKKEKEEGIEKGQILSSAAD 284 



1081 ACATTGCTGCCACAGTACAGCACACAATGGCATGTCATCTTGTGAAAAGAACACATCGGG 114 0 
285 IAATVQHTMACHLVKRTHRA 304 



1141 CTATTCTGTTTTGTAAGCAGAGAGACTTGTTACCTCAAAATAATGCAGTACTGGTTGCAT 12 00 
305 ILFCKQRDLLPQNNAVL.VAS 324 



1201 CTGGTGGTGTCGCAAGTAACTTCTATATCCGCAGAGCTCTGGAAATTTTT^ACAAACGCAA 1260 
325 GGVASNFYIRRALE ILTNAT 344 



1261 CACAGTGCACTTTGTTGTGTCCTCCTCCCAGACTATGCACTGATAATGGCATTATGATTG 132 0 
345 QCTLLCPPPRLCTDNGIMIA 364 



1321 CATGGAATGGTATTGAAAGACTACGTGCTGGCTTGGGCATTTTACATGACATAGAAGGCA 1380 
365 WNGIERLRAGLGILHDIEGI 384 



1381 TCCGCTATGAACCAAAATGTCCTCTTGGAGTAGACATATCAAAAGAAGTTGGAGAAGCTT 1440 
385 RYEPKCPLGVDI SKEVGEAS 404 



1441 CCATAAAAGTACCACAATTAAAAATGGAGATATGATTTCTGCTGTTCAAAAAAGTCCCTA 1500 
405 I KVPQLKMEI * 415 



1501 AAGGGTCTCACTCTCTGACCTCAGCTGGAGTACAGTAGCCAGATCACAACTCACTGCAAC 1560 



1561 CCTGACTTCCTGAACTCAAGAAATCCTCCTGCCTTAGCCTCTTGAATAGCCGGGACTACA 1620 



1621 GGTGTGCATGTCCATGCCCAGCCAACTTTATTTCTATTTTTTGTAGAGACAGGCTCTTGC 1680 



1681 CATGTTGCCCGGGCTGGTCCTGAACTGCTGAATTCAAGTGATCCTCCCACCTTGGCCTCC 1740 



1741 AGAAGTGCTGGGATTATGGGTGTGAGCCACCATGCCTAGCCAAAATGTTTCTTAAGGTAT 1800 



1801 ACATTTTGGGTCTTAGAAGACTTATACATTTGTAATATTTATTACTAAATATCTCAAAGT 1860 



1861 ATTACAATAAATGTTACCATGTGAGCTACTTTGAATCAGGCTTCTTGCACACCAATTTAA 1920 
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1921 AAATGTTAACTCTTGATATATACACTAGTTATACCACTCATGTCAGTCAATAAATTTTAA 1980 

1981 GGTTTAAGTGCAGGCCTTTGTTTACAGAAATCCTAATTTTTTGAAACCATAACTCTGACC 204 0 

2041 TGACACTAAATTCCTGTAGACATGCTAAGGAAAATCTGCTTAGTATCGAGATCAAGAACT 2100 

2101 TCCATTCAAAAAGATTATTCAGTTATGTTATTTGCATATTACCATTGTTAAAAATAAAAA 216 0 
2161 AATTTTTAAAAGATGAAAAAAAAAAAAAAAAAAAAAA 2197 
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251 300 
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mpl 1 MLILTKTAGVFFKPSKRKNnfEFLRSFNFHPGTLFLH^ 

MLILTKTAGVFFKPSKRKVT^ 

MLILTKTAGVFFKPSKRKVYEFLRSFNFHPGTLFLffi 
AC013468_6 -9850 acataaagggttactaaagtgttaatatccgactccsaagtgagaatgga 

ttt'tcaccgtttaccagataattggt^sitacgct'ttaa^ttgtecggaao 
gacg-bgtaatttaaaagattataatttt.ttaaatt.taaagatatt;ttta 



mpl 50 AAAWDETGNVLGEAIHSQTEVHL 

AAAVVDETGNVLGEAIHSQTEVHL 

AAAWDE TGNVLGEAI HSQTEVHL K:K[aaa] 
AC013468_6 -9703 gggggggagagtgggactcaggctAAGTAAGTA Intron 1 

cccttaacgattgactacacatat <2 [9629 : 3771] 

attggtatatggaaaatcatatta 



mpl 74 TGGrVPPAAQQLHRENlQRIVQEALSASGVS PSDLSAIATT IKP6 

TGG IVP PAAQQLHRENIQRXVQEALSAS GVS PSDLSAIATT IKPG 
TGGrVPPAAQQLHRENIQRrVQEALSASGVSPSDLSAIATTIKPG 

AC 01 3 4 6 8_6 -3773 CAGAaggagccggccccagaaccagcggctgaggt cagctgagaaaacg 

-2> cggttccccaatagaatagttaactccggtccgatcctccctacg 
atgtttaatagtcaattaaaaaatttctactatccaatatcaaaa 



mpl 120 ZJOiSIX3VGI.SFSLQLVGQLKKPFXPXHHMEAHAI.TXRL 

LALSLGVGLSFSLQLVGQLKKPFIPIHHMEAHALTIRLTNKVEFPET.VL 
LALSLGVGLSFSLQLVGQLKKPF I P I HHMEAHALT IRLTNKVEFPFLVL 

AC013468_6 -3634 cgtacgggtttatccggctaactacaccaggcgcaaataaaggtcttgc 

tctgtgtgtctgtattgataacttctaatacactctgtcaatatctttt 
ttacgagcaatcaggaagaagactctttggttatfctggctaaatttatt 



mpl 169 LX SGGHCLLALVQGVSDFLLLGKSLD XAPGDMLDK 

L I SGGHCLIAliVQGV SDFT J J iGKSLD IAPGDMIJDK 
L I SGGHCLLALVQGVSDFTiT J iGKSLD IAPGDMLDK 

AGO 1346 8__ 6 - 3 4 8 7 ta tggc tc tg tgcgg tgtcccga t tgagcggacga 

ttcggagttcttagtcattttgactatccgattaa 
gttatctggaataatattgttagtgcaaatcgtcg 



mpl 204 VARRLSLIKHPECSTMSGGKAIEHLA 

VARRLSLIKHPECSTMSGGKAIEHLA 
VARRLSLIKHPECSTMSGGKAIEHLA 

AC013468_6 -3382 GTAATTA Intron 2 TAGggaacttaaccgttaaaggagagctg 

<0 [3382 : 2556] -0>tcggtcttaacagcctgggactaatc 

gaaattaaatagcccgttgacaatgc 



mpl 230 KQGNRFHFDIKPPLHHAKNCDFSFTGLQHVTDKI XMKKEKEE 

KQGNRFHFDIKPPLHHAKNCDFSFTGLQHVTDKI XMKKEKEE 
KQGNRFHFD XKPPLHHAKNCDFS FTGLQHVTDKI XMKKEKEE 

AC013468_6 -2477 acgaatctgaacctccgaatgtttagcccgagaaaaaagagg 

aagagtatatacctaacaagatctcgtaatcaatttaaaaaa 
aaatatttccatcgtttatttttttatactttaaagagaaga 
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*Pl 272 IEKGQILSSAADIAATVQHTMAC 

IEKGQILSSAADIAATVQHTMAC 
6 : 6 [ggt ] IEKGQILSSAADIAATVQHTMAC 
AC013468_6 -2351 GGTATATT Intron 3 CAGGTagagcacttgggaggagccaagt 

<1 [2350 : 2275] -1> taagattccccatccctaactcg 

tgggacgtaaacttcaagcagat 

mpl 296 HLVKRTHRAILFCKQRDLIjPQNNAVXi 

HLVKRTHRAILFCKQRDLLPQNNAVL 

HLVKRTHRAILFCKQRDLLPQNHAVL 
AC013468__6 -2203 ccgaaaccgacttacagttccaaggcGTAAGTT Intron 4 CAG 

attagcagctttgaagattcaaactt<0 [2125 : 11 90 ] -0> 

ttgaaatgttgttggacgatattaag 

mpl 322 VASGGVASNFXTRRALE ILTNATQCTLXiCPPPRLCTDNGIMIA 

VASGGVASNFYIRRAIiE ILTNATQCTLLCPPPRIiCTDNGIMIA 
VASGGVASNFY IRRALE ILTNATQCTLLCPPPRLCTDNGIMIA 

AC 01 346 8_6 - 1 1 8 9 gg tggggaa t tacagcga taagac ta 1 1 tccca c tagagaaag 

tccggtcgatatggctattcaccagcttgcccgtgcaagtttc 
tatttcatcctccatgataataagctggtttcaactttctgta 

m Pl 365 NG IERLRAGLGIIiHD XEGXRYE P 

NGXEKLRAGIfGXIiHD IE G XRYE P 
W:W[tgg] NGIERIjRAGIiGILHDIEGIRYEP 
AC013468_6 -1060 TGGTAAGCC Intron 5 TAGGagagaccggtgatcgaggactgc 

<2 [1058 : 935] -2> agtagtgcgtgttaatagtgaac 

tttaaattcgctatcaaccctaa 



mpl 

AC013468 6 



389 K 
K 
K 

-864 a 
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11641265 1 MLILTKTAGVTTFKPSKRKVYEFIJ^FNra 

MLILTKTAGVFFKPSKRKVYEFLRSFNFHP TLFLHKIVLGIETSCDDT 
MLILTKTAGVFFKPSKRKV^TEFIiRSFNFHPGTLFIJIKTVIjGIETSCDDT 

AC013468_6 -9850 acataaagggttactaaagtgttaatatccgactccaagtgagaatgga 

ttttcaccgtttaccagataattggtatacgctttaatttgtacggaac 
gacgtgtaatttaaaagattataattttttaaatttaaagatattttta 



11641265 50 AAAVVDETGNVLGEAIHSQTEVHL 

AAAWDE TGNVLGEAIHSQTEVHL 

AAAVVDETGNVIiGEAIHSQTEVHI, K : K [ aaa ] 

AC013468_6 -9703 gggggggagagtgggactcaggctAAGTAAGTA Intron 1 

cccttaacgattgactacacatat <2 [9629 • 3771 J 

attggtatatggaaaatcatatta 



11 64 12 6b 74 TGGIVPPAAQQLHRENIQRIVQEALSASGVSPSDLSAXATTIKPG 

TGGIVPPAAQQLHRENIQRIVQEALSAS GVS PSDLSAIATT IKPG 
TGGIVPPAAQQLHRENIQRIVQEALSASGV'SPSDLSAIATTIKPG 

AC013468_6 -3773 CAGAaggagccggccccagaaccagcggctgaggtcagctgagaaaacg 

-2> cggttccccaatagaatagttaactccggtccgatcctccctacg 
atgtttaatagtcaattaaaaaatttctactatccaatatcaaaa 



11641265 120 LALSLGVGLSFSLQLVGQLKKPFIPIHHMEJ^^ 

IJ^SLGVGLSFSI^LVGQI^aCPFIPIHHMEAHALTIKL 
IJ^SLGVGLSFSLQIiVGQIiKKPFIPIHHMEAHALTIRLTNKVEFPEXVL 

AC013468_6 -3634 cgtacgggtttatccggctaactacaccaggcgcaaataaaggtcttgc 

tctgtgtgtctgtattgataacttctaatacactctgtcaatatctttt 
ttacgagcaatcaggaagaagactctttggttatttggctaaatttatt 



11641265 169 LI SGGHCIJ^AIiVQGVSDFLIJLGKSLDIAPGDMLDK 

LIS GGH CLLALiVQGVSDFLIxLGKS LD IAPGDMLDK 
L I SGGHCLLALVQGVSDFLLLGKSLD IAPGDMLDK 

AC013468_6 -3487 tatggctctgtgcggtgtcccgattgagcggacga 

ttcggagttcttagtcattttgactatccgattaa 
gttatctggaataatattgttagtgcaaatcgtcg 



11641265 204 VARKLSLIKHPECSTMSGGKAIEHLA 

VARKLSLIKHPECSTMSGGKAIEHLA 
VARKLSLIKHPECSTMSGGKAIEHLA 

AC013468_6 -3382 GTAATTA Intron 2 TAGggaacttaaccgttaaaggagagctg 

<0 [3382 : 2556] -Otcggtcttaacagcctgggactaatc 

gaaattaaatagcccgttgacaatgc 

11641265 230 KQGNRFHFDIKPPLHHAKNCDFSFTGLQHVTDKI IMKKEKEEGIFLISK 

KQO^RFHFDIKPPLHHAKNCDFSFTGLQHVTDKI IMKKEKEEGIFLISK 
KQGNRFHFDIKPPLHHAKNCDFSFTGLQHVTDKI IMKKEKEEGIFLISK 

AC0134 68_6 -2477 acgaatctgaacctccgaatgtttagcccgagaaaaaagagggatcaaa 

aagagtatatacctaacaagatctcgtaatcaatttaaaaaagrttttga 
aaatatttccatcgtttatttttttatactttaaagagaagatatatta 

FRAME SHIFT HERE 
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11641265 279 VEQ IN I PGLCLKIAAHFCRYEKGQ I LS SAAD IAATVQHTMACHLVKRTH 

VEQINIPGLCLKIAAHFCRY KGQILS SAAD IAATVQHTMACHLVKRTH 
VEQINIPGLCLKIAAHFCRY ! KGQ I LS SAAD IAATVQHTMACHLVKRTH 

AGO 1346 8_6 -2330 ggcaaacgt tcaaggc t ta t4 agcac t tgggaggagccaagtccgaaac 

taatatcgtgtatccatgga agattccccatccctaactcgattagca 
tagatttagcaaatttccgt ggacgtaaacttcaagcagatttgaaat 



11641265 328 RAILFCKQRDLLPQNNAVL VASG6VA 

RAILFCKQRDLLPQNNAVL VASGGVA 
RAILFCKQRDLLPQNNAVL VASGGVA 

AC013468_6 -2182 cgacttacagttccaaggcGTAAGTT Intron 3 CAGggtgggg 

gctttgaagattcaaactt<0 [2125 : 1190 ] -0>tccggfcc 

gtfcgtfcggacgatattaag tatttca 



11641265 354 SNFYIRRALE ILTNATQCTLLCPPPRLCTDNGIMIA 

SNFYIRRALE ILTNATQCTLLCPPPRLCTDNGIMIA 
SNFYIRRALE ILTNATQCTLLCPPPRLCTDNGIMIA 

AC013468__6 -1168 aattacagcgataagactatttcccactagagaaag 

gatatggctatfccaccagcttgcccgtgcaagtttc 
tccfcccatgataataagctggtttcaactttctgta 



11641265 390 NGIERLRGGLGILHDIEGIRYEP 

NGIERLR GLGILHDIEGIRYEP 
W : W [ tgg] NGIERLRAGLGILHD IEGIRYE P 

AC013468_6 -1060 TGGTAAGCC Intron 4 TAGGagagaccggtgatcgaggactgc 

<2 [1058 : 935] -2> agtagtgcgtgttaatagtgaac 

tttaaattcgctatcaaccctaa 



11641265 414 K 

K 
K 

AC013468 6 -864 a 



FIG. 7B 
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Protein 


Genbank 
ID 


Identities 


Similarities 


Arabidopsis O-sialoglycoprotein 
endopeptidase protein 


gi 12583127 


30.8% 


36% 


Caenorhabditis glycoproteinase 
family member protein 


gi 17495111 


26.6% 


41% 


Thermotoga secreted 
metalloendopeptidase Gcp 
protein 


gi 14980638 


27.2% 


39% 


Helicobacter O-sialoglycoprotein 
endopeptidase GCP_HELPY 
protein 


gi|2499846 


22.5% 


34% 



FIG. 8 
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gi 



gi 



gi 



gi 



gi 



gi 



gi 
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gi 



gi 
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gi 



MP-l 
11641264 



MP-l 
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MP-l 
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MP-l 
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MP-l 
11641264 



MP-l 
11641264 



MP-l 
11641264 



MP-l 
11641264 



MP-l 
11641264 



(1) 
(1) 



(51) 
(1) 



(101) 
(1) 



(151) 
(1) 



(201) 
(1) 



(251) 
(44) 



(301) 
(94) 



(351) 
(144) 



(401) 
(194) 



(451) 
(244) 



(501) 
(294) 



(551) 
(344) 



(601) 
(394) 



(651) 
(444) 



(701) 
(494) 



(751) 
(544) 



(801) 
(594) 



1 50 
CGACAGTCTTTAGTAGGGAAAGGAGACAAGTGCTAGCTACTGCCGCCCAA 



51 100 
GTGGAAGGTGGGTGAAATTGCTCACTCTTCACCCCACTGACGCTTTTGCG 



101 150 
CACCTGGAAAAGCGGTTCCAGTTTGCGCCCGTCGCCGCCTTACAGCCGAC 



151 200 

AG GAG AC C AG CG CTAC CC AAG TC ACGTG GGTTC AGC CTG C AGCTTTCTTG 



201 

GCCCGAAAG 
CA 

251 



250 



GGAATTATCTATAGAGTAAGTATGCTAATCTTGACTAAGAC 
GGAATTATCTATAGAGTAAGTATGCTAATCTTGACTAAGAC 



300 



TGCAGGAGTTTTTTTTAAACCATCAAAAAGGAAAGTTTATGAATTTTTAA 
TGCAGGAGTTTTTTTTAAACCATCAAAAAGGAAAGTTTATGAATTTTTAA 



301 



350 



GAAGTTTTAATTTTCATCCTGg 


AACACTATTTCTTCATAAAATAGTATTG 


GAAGTTTTAATTTTCATCCTGg 


AACACTATTTCTTCATAAAATAGTATTG 


351 


400 


GGAATTGAAACTAGTTGTGATGATACAGCAGCTGCTGTGGTGGATGAAAC 
GGAATTGAAACTAGTTGTGATGATACAGCAGCTGCTGTGGTGGATGAAAC 


401 


450 


TGGAAATGTGTTGGGAGAAGCAATACATTCCCAAACTGAAGTTCATTTAA 


TGG AAATG TG TTGGG AG AAGC A 


ATAC ATTCCC AAAC TGAAGTTC ATTTAA 


451 


500 


AAACAGGTGGGATTGTTCCTCCAGCAGCTCAACAGCTTCACAGAGAAAAT 


AAACAGGTGGGATTGTTCCTCC 


AGCAGCTCAACAGCTTCACAGAGAAAAT 


501 


550 


ATTCAACGAATAGTACAAGAAG 


CTCTTTCTGCCAGTGGAGTCTCTCCAAG 


ATTCAACGAATAGTACAAGAAG 


CTCTTTCTGCCAGTGGAGTCTCTCCAAG 


551 


600 


TGACCTCTCAGCAATTGCAACTACCATAAAACCAGGACTTGCTTTAAGCC 


TGACCTCTCAGCAATTGCAACT 


ACCATAAAACCAGGACTTGCTTTAAGCCj 


601 


650 


TGGGAGTGGGCTTATCATTTAGCTTACAGCTGGTAGGACAGTTAAAAAAG 


TGGGAGTGGGCTTATCATTTAG 


CTTACAGCTGGTAGGACAGTTAAAAAAG 


651 


700 


CCATTCATTCCCATTCATCATATGGAGGCTCATGCACTTACTATTAGGTT 


CCATTCATTCCCATTCATCATATGGAGGCTCATGCACTTACTATTAGGTT 


701 


750 


GACCAATAAAGTAGAATTTCCTTTTTTAGTTCTTTTGATTTCTGGAGGTC 


GACCAATAAAGTAGAATTTCCTTTTTTAGTTCTTTTGATTTCTGGAGGTC 


751 


800 


ACTGTCTGTTGGCATTAGTTCAAGGAGTTTCAGATTTTCTGCTTCTTGGAI 


ACTGTCTGTTGGCATTAGTTCA 


AGGAGTTTCAGATTTTCTGCTTCTTGGA 


801 


850 



AAGTCTTTGGACATAGCACCAGGTGACATGCTTGACAAGGTGGCAAGAAG 
AAGTCTTTGGACATAGCACCAGGTGACATGCTTGACAAGGTGGCAAGAAG 



FIG. 1 0A 
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MP-l 
gi|H641264 



MP-l 
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MP-l 
gi (11641264 



MP-l 
gi 1 11641264 



ACTTTCTTTAATAAAACATCCAGAGTGCTCCACCATGAGTGGTGGGAAAG 
ACTTTCTTTAATAAAACATCCAGAGTGCTCCACCATGAGTGGTGGGAAAG 



CCATAGA g CATTTGGCCAAACAAGGAAATAGATTTCATTTTGACATCAAA 
CCATAGAffiCATTTGGCCAAACAAGGAAATAGATTTCATTTTGACATrAA A 



CCTCCCTTGCATCATGCTAAAAATTGTGATTTTTCTTTTACTGGACTTCA 
CCTC CCTTGCATCATGCTAAAAATTGTGATTTTTCTTTTACTGGACTTCA 



851 900 

(851) 
(644) 

901 9 5 o 

(901) 
(694) 

951 1000 

(951) 
(744) 

1001 1050 

(794) ttoftfaMnbil^ 

1051 1100 

(1049) 

(844) TTCTAATTAGTAAAGTTGAACAGATAAATATTCCTGGATTGTGCCTAAAA 

1101 H50 

(1050) 

(894) ATAGCTGCTCATTTCTGCAGGTAE 

1151 1200 

(1076) 
(944) 

1201 1250 

(112 6) 
(994) 

1251 1300 

(1176) 
(1044) 

1301 1350 

(1226) 
(1094) 

1351 1400 

(1276) - — 

(1144) 

1401 1450 

(1326) 
(1194) 

1451 1500 

(1376) 
(1244) 

1501 1550 

(1426) 
(1294) 

1551 1600 
(147 6) gjyjgjgjgggj^^ agp 
(1344) ImwmyKWMiMwiMigBMM^ 

1601 1650 
(1526) TGGAGTACAGTAGCCAGATC AC AACTCACTGC AACCCTGACTTCCTG AAC 
(1388) 

1651 1700 

(1576) tcaagaaatcctcctgccttagcctcttgaatagccgggactacaggtgt 

(1388) 

FIG. 10B 



r G AG AAGGGG C AAAT C CT GTC TT C AG C 
PGAGAAGGGGCAAATCCTGTCTTCAGC 



AGCAGACATTGCTGCCACAGTACAGCACACAATGGCATGTCATCTTGTGA 
AGCAGACATTGCTGCCACAGTACAGCACACAATGGCATGTCATCTTGTGA 



AAAGAACACATCGGGCTATTCTGTTTTGTAAGCAGAGAGACTTGTTACCT 
AAAGAACACATCGGGCTATTCTGTTTTGTAAGCAGAGAGACTTGTTACCT 



:aaaataatgcagtactggttgcatctggtggtgtcgcaagtaacttcta 

rAAAATAATGCAGTACTGGTTGCATCTGGTGGTGTCGCAAGTAACTTCTA 



tatccgcagagctctggaaattttaacaaacgcaacacagtgcactttgt 



TATCCGCAGAGCTCTGGAAATTTTAACAAACGCAACACAGTGCACTTTGT 



TGTGTCCTCCTCCCAGACTATGCACTGATAATGGCATTATGATTGCATGG 
TGTGTCCTCCTCCCAGACTATGCACTGATAATGGCATTATGATTGCATGG 



AATGGTATTGAAAGACTACGTG g TGGCTTGGGCATTTTACATGACATAGA 
AATGGTATTGAAAGACTACGTGg TGGCTTGGGCATTTTACATGACATAGA 



AGGCATCCGCTATGAACCAAAATGTCCTCTTGGAGTAGACATATCAAAAG 
■A.GGCATCCGCTATGAACCAAAATGTCCTCTTGGAGTAGACATATCAAAAG 



AAGTTGGAGAAGCTTCCATAAAAGTACCACAATTAAAAATGGAGATATGA 
AAGTTGGAGAAGCTTCCATAAAAGTACCACAATTAAAAATGGAGATATGA 
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MP-1 
git 11641264 



MP-1 
gi 1 11641264 



MP-1 
gi 1 11641264 



MP-1 
gi 111641264 



MP-1 
gi 1 11641264 



MP-1 
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MP-1 
gi 1 11641264 



MP-1 
gi 111641264 



MP-1 
gi 1 11641264 



MP-1 
gi 1 11641264 



MP-1 
gi|11641264 



MP-1 
gil 11641264 



1701 1750 
(1626) GCATGTCCATGCCCAGCCAACTTTATTTCTATTTTTTGTAGAGACAGGCT 
(1388) 

1751 1800 
(1676) CTTGCCATGTTGCCCGGGCTGGTCCTGAACTGCTGAATTCAAGTGATCCT 
(1388) 

1801 1850 
(1726) CCCACCTTGGCCTCCAGAAGTGCTGGGATTATGGGTGTGAGCCACCATGC 
(1388) 

1851 1900 
(1776) CTAGCCAAAATGTTTCTTAAGGTAT ACATTTTGGGTCTT AGAAGACTTAT 
(1388) 

1901 1950 
(1826) ACATTTGTAATATTTATTACTAAATATCTCAAAGTATTACAATAAATGTT 
(1388) 

1951 2000 
(1876) ACCATGTGAGCTACTTTGAATCAGGCTTCTTGCACACCAATTTAAAAATG 
(1388) 

2001 2050 
(1926) TTAACTCTTGATATATACACTAGTTATACCACTCATGTCAGTCAATAAAT 
(1388) 

2051 2100 
(1976) TTTAAGGTTTAAGTGCAGGCCTTTGTTTACAGAAATCCTAATTTTTTGAA 
(1388) 

2101 2150 
(2026) ACCATAACTCTGACCTGACACTAAATTCCTGTAGACATGCTAAGGAAAAT 
(1388) 

2151 2200 
(2076) CTGCTTAGTATCGAGATCAAGAACTTCCATTCAAAAAGATTATTCAGTTA 
(1388) 

2201 2250 
(2126) TGTTATTTGCATATTACCATTGTTAAAAATAAAAAAATTTTTAAAAGATG 
(1388) 

2251 2272 
(2176) AAAAAAAAAAAAAAAAAAAAAA 
(1388) 
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